## Distribute threads evenly across all NUMA nodes.
#export OMP_PROC_BIND=spread
#export OMP_PLACES=cores
#export OMP_NUM_THREADS=80
#./stream_c.exe

## Pin the run to specific NUMA nodes with numactl (20 threads).
# Number of OpenMP threads used by the benchmark run below.
# NOTE(review): 20 is presumably the core count of one NUMA node — confirm
# against the target machine.
OMP_NUM_THREADS=20
export OMP_NUM_THREADS

# Alternative: run on node 0's CPUs with the default memory policy.
#numactl --cpunodebind=0 ./stream_c.exe

# Active configuration: execute on the CPUs of node 1 (-N == --cpunodebind)
# while allocating memory only from node 2 (-m == --membind).
# NOTE(review): this looks like a deliberate cross-node (remote memory)
# measurement — confirm that the differing node ids are intended.
numactl -N 1 -m 2 \
  ./stream_c.exe

# Alternative: run without any NUMA binding.
#./stream_c.exe
